from pydantic import BaseModel


# Pydantic model grouping timing figures, token counts, and the response text
# (presumably for a single LLM generation call — confirm against the producer).
# Every field declares a default, so ``GenerationResult()`` can be constructed
# with no arguments.
# NOTE(review): the units of the time fields are not visible in this file
# (presumably seconds) — confirm against the code that populates them.
# NOTE(review): comments are used instead of a class docstring on purpose;
# Pydantic exposes a model docstring as the JSON-schema ``description``.
class GenerationResult(BaseModel):
    # Time attributed to the prefilling phase; defaults to 0.0.
    prefilling_time: float = 0.0
    # Time attributed to the generation phase; defaults to 0.0.
    generation_time: float = 0.0
    # Per-token time for the generation phase; defaults to 0.0.
    # Presumably generation_time / total_tokens_generation — this model does
    # not compute or enforce that relationship; verify at the call site.
    time_per_token_generation: float = 0.0
    # Token count for the generation phase; defaults to 0.
    total_tokens_generation: int = 0
    # Per-token time for the prefilling phase; defaults to 0.0.
    # Presumably prefilling_time / total_tokens_prefilling — not enforced here.
    time_per_token_prefilling: float = 0.0
    # Token count for the prefilling phase; defaults to 0.
    total_tokens_prefilling: int = 0
    # Response text (presumably the raw model output); defaults to "".
    llm_response: str = ""
